Research Guide




Logical

# dgf.logical <- dgf[14:15,  ]
create_all_sections( dgf.log )

F9_05_UBIZ_IMCOME_OVER_LIMIT_X

LABEL: F9_05_UBIZ_IMCOME_OVER_LIMIT_X

DATA TYPE: logical

DESCRIPTION: Had unrelated business gross income of $1,000 or more [x]

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 2
Most Common Value N (86%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

VALUES:

Value Frequency
N 21550
Y 3450

BOOLPLOT:

OUTNCCS

LABEL: OUTNCCS

DATA TYPE: logical

DESCRIPTION: Out of Scope flag

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 3
Most Common Value IN (100%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 2361 (9.4%)
Infinite 0 (0%)

VALUES:

Value Frequency
IN 22600
NA 2361
OUT 39

BOOLPLOT:

Factor

# dgf.factor <- dgf[6:13,  ]
create_all_sections( dgf.fact )

SUBSECCD

LABEL: SUBSECCD

DATA TYPE: factor

DESCRIPTION: IRS subsection code

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 23
Most Common Value 6 (26%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
6 6391
4 4936
7 3571
5 3449
8 1479
19 1459

TREEMAP:

BMF_ACTIV1

LABEL: BMF_ACTIV1

DATA TYPE: factor

DESCRIPTION: IRS Activity Code 1

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 230
Most Common Value 0 (25%)
Zero 5807 (23.2%)
All Empty 0 (0%)
Missing/NA 1887 (7.5%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
0 5807
263 1782
200 1648
907 1212
36 1054
279 998

TREEMAP:

NTMAJ12

LABEL: NTMAJ12

DATA TYPE: factor

DESCRIPTION: NTEE major group (12)

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 12
Most Common Value PU (37%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
PU 9128
HU 7955
MU 2480
ED 1528
UN 1524
HE 994

TREEMAP:

NTEE1

LABEL: NTEE1

DATA TYPE: factor

DESCRIPTION: NTEE major group

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 27
Most Common Value S (25%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 1497 (6%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
S 5817
N 3018
W 2835
Y 2480
J 1961
B 1552

TREEMAP:

NTEEFINAL

LABEL: NTEEFINAL

DATA TYPE: factor

DESCRIPTION: NA

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 654
Most Common Value S41 (8%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 1497 (6%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
S41 1947
J40 1815
W30 1582
S80 1515
N50 1088
M24 810

TREEMAP:

NTEESRC

LABEL: NTEESRC

DATA TYPE: factor

DESCRIPTION: NA

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 16
Most Common Value BEST (53%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 1378 (5.5%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
BEST 12410
WORD 4000
NEW 2621
IRS 2540
SOI 855
ZZ 454

TREEMAP:

DEDUCTCD

LABEL: DEDUCTCD

DATA TYPE: factor

DESCRIPTION: IRS Deductibility code

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 5
Most Common Value 2 (80%)
Zero 685 (2.7%)
All Empty 0 (0%)
Missing/NA 1887 (7.5%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
2 18494
1 3932
0 685
4 2

TREEMAP:

OUTREAS

LABEL: OUTREAS

DATA TYPE: factor

DESCRIPTION: Reason why out of scope

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 5
Most Common Value NA (99.8%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 24961 (99.8%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
T 15
F 12
S 11
N 1

TREEMAP:

F9_00_TAX_PERIOD_END_DATE

LABEL: F9_00_TAX_PERIOD_END_DATE

DATA TYPE: factor

DESCRIPTION: Tax period end date

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 47
Most Common Value 2019-12 (40%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
2019-12 9884
2018-12 3477
2019-06 2064
2017-12 1626
2020-06 1312
2018-06 840

TREEMAP:

F9_00_TAX_PERIOD_END_DATE_PY

LABEL: F9_00_TAX_PERIOD_END_DATE_PY

DATA TYPE: factor

DESCRIPTION: Tax period end date - prior year

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 47
Most Common Value 2018-12 (45%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 4344 (17.4%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
2018-12 9298
2017-12 3002
2018-06 1767
2019-06 1060
2018-09 744
2017-06 539

TREEMAP:

F9_00_TAX_ACCPER

LABEL: F9_00_TAX_ACCPER

DATA TYPE: factor

DESCRIPTION: Accounting period - month in which the tax period ends

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 12
Most Common Value 12 (60%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

MOST COMMON VALUES:

Value Frequency
12 14987
06 4578
09 1251
03 849
05 796
08 688

TREEMAP:

Numeric

# dgf.num <- dgf[22:27,  ]
create_all_sections( dgf.num )

COUNTY_FIPS

LABEL: COUNTY_FIPS

DATA TYPE: numeric

DESCRIPTION: State + County FIPS code

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 2411
Most Common Value NA (9.6%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 2389 (9.6%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum 1,001
Q - 05 6,019
Q - 25 17,027
Median 27,163
Mean 28,405.45
Q - 75 41,051
Q - 95 53,033
Maximum 78,030
Skew -0.01

HIST:

DATA PREVIEW:

26125 19153
6073 34003
42101 48201
26163 39035
4013 6059
48113 39049
36059 36061
18097 6001
25027 6037
36103 42003

CEO_CENSUSTRACT

LABEL: CEO_CENSUSTRACT

DATA TYPE: numeric

DESCRIPTION: Census tract

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 14265
Most Common Value NA (12.4%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 3110 (12.4%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum 1,001,020,500
Q - 05 6,029,003,250
Q - 25 17,031,320,100
Median 28,012,950,350
Mean 28,488,147,053
Q - 75 41,051,008,202
Q - 95 53,033,008,055
Maximum 5.6043e+10
Skew -0.02

HIST:

DATA PREVIEW:

48453000102 36061016100
6073020809 11001010100
11001006202 6075061500
48113020300 51510201900
11001010700 18097391000
17031320100 28049010500
350 6085512100
11001005900 22033003501
48453001100 42003191100
48201531700 6075011700

F9_08_REV_TOT_TOT

LABEL: F9_08_REV_TOT_TOT

DATA TYPE: numeric

DESCRIPTION: Total revenue - total

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 23817
Most Common Value 0 (2%)
Zero 413 (1.7%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum -61,467,591
Q - 05 3,359.8
Q - 25 51,012.5
Median 130,545
Mean 3,740,777
Q - 75 441,954.5
Q - 95 6,355,357
Maximum 4,178,522,311
Skew 44.03

HIST:

DATA PREVIEW:

1500 19611
1800 50
48000 4125
600 5000
25500 26873
1000 5400
10000 4
100 2000
101225 9465
100000 575

F9_10_ASSET_TOT_BOY

LABEL: F9_10_ASSET_TOT_BOY

DATA TYPE: numeric

DESCRIPTION: Total assets - beginning of year

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 20195
Most Common Value 0 (13%)
Zero 3011 (12%)
All Empty 0 (0%)
Missing/NA 1377 (5.5%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum -69,049
Q - 05 0
Q - 25 31,558.5
Median 169,734
Mean 11,116,959
Q - 75 729,844.5
Q - 95 13,488,117
Maximum 11,226,543,829
Skew 41.82

HIST:

DATA PREVIEW:

300 21915
3087 343
4612 1535
20855 388
212 4412
1642 1593
1222 3708
10571 8302
1020 3073
1000 3068

F9_10_ASSET_TOT_EOY

LABEL: F9_10_ASSET_TOT_EOY

DATA TYPE: numeric

DESCRIPTION: Total assets - end of year

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 24122
Most Common Value 1 (1%)
Zero 110 (0.4%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum -1,119,570
Q - 05 4,421.45
Q - 25 55,668.25
Median 212,649
Mean 13,755,826
Q - 75 837,286
Q - 95 14,639,755
Maximum 38,468,314,242
Skew 85.67

HIST:

DATA PREVIEW:

680 1374
1203 21
415 663
1383 30
478 1107
480 529
90 0
459 997
10000 1932
2280 1158

F9_10_NAFB_TOT_BOY

LABEL: F9_10_NAFB_TOT_BOY

DATA TYPE: numeric

DESCRIPTION: Net assets or fund balances - beginning of year

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 20145
Most Common Value NA (17.4%)
Zero 203 (0.8%)
All Empty 0 (0%)
Missing/NA 4344 (17.4%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum -333,005,908
Q - 05 1,659.5
Q - 25 52,689.5
Median 192,629.5
Mean 4,921,982
Q - 75 720,262.5
Q - 95 10,744,071
Maximum 6,323,689,488
Skew 61.69

HIST:

DATA PREVIEW:

0 8311
9369 8942
4412 4414
9110 24587
9527 20855
5619 2870
97 4612
3708 3068
5318 8853
-21474 1547

F9_09_EXP_TOT_TOT

LABEL: F9_09_EXP_TOT_TOT

DATA TYPE: numeric

DESCRIPTION: Total functional expenses - total expenses

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 23740
Most Common Value 0 (2%)
Zero 489 (2%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum -11,719
Q - 05 3,886.95
Q - 25 46,845
Median 121,792.5
Mean 3,531,376
Q - 75 411,837.2
Q - 95 5,832,724
Maximum 4,256,605,589
Skew 46.21

HIST:

DATA PREVIEW:

80427 539
261 60157
225 500
83437 588
10 10000
153299 25
129 175
400 83368
45638 397
62391 16927

F9_01_EXP_TOT_PY

LABEL: F9_01_EXP_TOT_PY

DATA TYPE: numeric

DESCRIPTION: Total expenses - prior year

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 19931
Most Common Value 0 (14%)
Zero 3257 (13%)
All Empty 0 (0%)
Missing/NA 1377 (5.5%)
Infinite 0 (0%)

STATS:

STAT VAL
Minimum -5,437,471
Q - 05 0
Q - 25 29,933
Median 102,618
Mean 3,407,085
Q - 75 362,012.5
Q - 95 5,357,595
Maximum 4,624,922,368
Skew 48.26

HIST:

DATA PREVIEW:

10 5853
44039 25853
5640 3200
56378 3400
5000 736
2505 3433
0 20
5791 7500
7268 656
2489 7393

Character

# dgf.chr <- dgf[c(1:5, 20),  ]
create_all_sections( dgf.chr )

F9_00_ORG_NAME_L1

LABEL: F9_00_ORG_NAME_L1

DATA TYPE: character

DESCRIPTION: Organization name line 1

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 17455
Most Common Value NA (5.5%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 1378 (5.5%)
Infinite 0 (0%)

PREVIEW:

AMERICAN FEDERATION OF TEACHERS INTERNATIONAL BROTHERHOO
AMERICAN LEGION KIWANIS INTERNATIONAL INC
BENEVOLENT & PROTECTIVE ORDER OF ELKS OF THE USA KNIGHTS OF COLUMBUS
FRATERNAL ORDER OF EAGLES ROTARY INTERNATIONAL
INTERNATIONAL ASSOCIATION OF FIRE FIGHTERS UNITED STEELWORKERS
INTERNATIONAL ASSOCIATION OF LIONS CLUBS VETERANS OF FOREIGN WARS OF THE UNITED STATES DE

STATS:

STAT CHARACTERS WORDS
Minimum 3 1
Median 34 5
Mean 35.64 5.08
Max 97 17
Skew 0.43 0.94

Word Cloud:

F0_00_ORG_CONTACT

LABEL: F0_00_ORG_CONTACT

DATA TYPE: character

DESCRIPTION: Contact person (from IRS files)

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 10990
Most Common Value NA (53.6%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 13392 (53.6%)
Infinite 0 (0%)

PREVIEW:

AGRECORDS POST QUARTERMASTER
AIPSO PRESIDENT
BOARD OF TRUSTEES QUARTERMASTER
BRIANNE TILLOTSON SCIARABBA WALKER
COMMANDER SECRETARY
COMMERCE SECRETARY TREASURER
CREST MANAGEMENT SORORITY SOLUTIONS
FINANCIAL SECRETARY THE BANK OF NEW YORK MELLON
GEO THE ORGANIZATION
MIDAMERICA RET & ADMIN SOL INC TREASURER
PEO TREASURER WORTHY SECRETARY

STATS:

STAT CHARACTERS WORDS
Minimum 1 1
Median 14 2
Mean 15.02 2.49
Max 33 9
Skew 1.29 1.63

Word Cloud:

F9_00_ORG_ADDR_L1

LABEL: F9_00_ORG_ADDR_L1

DATA TYPE: character

DESCRIPTION: Organization street address line 1

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 18785
Most Common Value NA (5.5%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 1378 (5.5%)
Infinite 0 (0%)

PREVIEW:

1154 TOWN AND COUNTRY COMMONS DR PO BOX 24
3700 GRAND AVE PO BOX 250
695 PRO MED LN STE 300 PO BOX 26
9717 ELK GROVE FLORIN RD STE B PO BOX 37
PO BOX 1 PO BOX 4
PO BOX 111 PO BOX 40
PO BOX 123 PO BOX 5
PO BOX 151 PO BOX 535007
PO BOX 175 PO BOX 6
PO BOX 187 PO BOX 66
PO BOX 2 PO BOX 8
PO BOX 217 PO BOX 86
PO BOX 23 PO BOX 9

STATS:

STAT CHARACTERS WORDS
Minimum 2 1
Median 15 3
Mean 16.04 3.75
Max 35 9
Skew 0.97 1.42

Word Cloud:

F9_00_ORG_ADDR_CITY

LABEL: F9_00_ORG_ADDR_CITY

DATA TYPE: character

DESCRIPTION: Organization city

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 5986
Most Common Value NA (5.5%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 1378 (5.5%)
Infinite 0 (0%)

PREVIEW:

ALBANY LOS ANGELES
ALEXANDRIA LOUISVILLE
ATLANTA MADISON
AUSTIN NEW YORK
BOSTON PHILADELPHIA
CHICAGO PHOENIX
CLEVELAND PITTSBURGH
COLUMBIA PORTLAND
COLUMBUS RICHMOND
DALLAS SACRAMENTO
DENVER SAINT LOUIS
HONOLULU SAN DIEGO
HOUSTON SAN FRANCISCO
INDIANAPOLIS SEATTLE
LAS VEGAS SPRINGFIELD
LEXINGTON WASHINGTON

STATS:

STAT CHARACTERS WORDS
Minimum 3 1
Median 9 1
Mean 8.69 1.26
Max 22 4
Skew 0.23 1.46

Word Cloud:

EIN

LABEL: EIN

DATA TYPE: character

DESCRIPTION: EIN

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 24794
Most Common Value 020212092 (0%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

PREVIEW:

010100593 010874048
010218055 010961458
010220588 016011483
010266289 016012302
010273431 016019950
010286963 016022337
010440702 016123853
010468398 020172119
010523313 020187390
010524078 020212092
010573723 020232424
010715375 020241397
010744517 020257793
010815981 020324779
010852125 020349390

STATS:

STAT CHARACTERS WORDS
Minimum 9 1
Median 9 1
Mean 9 1
Max 9 1
Skew NaN NaN

Word Cloud:

F9_00_TAX_PERIOD_BEGIN_DATE

LABEL: F9_00_TAX_PERIOD_BEGIN_DATE

DATA TYPE: character

DESCRIPTION: Tax period begin date

PROPERTIES:

STAT VAL PER
Rows 25000
Distinct 12
Most Common Value 2019-0 (41%)
Zero 0 (0%)
All Empty 0 (0%)
Missing/NA 0 (0%)
Infinite 0 (0%)

PREVIEW:

2016-9 2018-9
2017-0 2019-0
2017-1 2019-1
2017-9 2019-9
2018-0 2020-0
2018-1 2020-1

STATS:

STAT CHARACTERS WORDS
Minimum 6 1
Median 6 1
Mean 6 1
Max 6 1
Skew NaN NaN

Word Cloud: